FROM python:3.10-slim

WORKDIR /app

COPY requirements.txt .
RUN pip install --no-cache-dir -r requirements.txt && \
    pip install --no-cache-dir scrapyd scrapydweb logparser

# 安装浏览器相关依赖
RUN apt-get update && apt-get install -y \
    wget \
    gnupg \
    fonts-liberation \
    libasound2 \
    libatk-bridge2.0-0 \
    libatk1.0-0 \
    libatspi2.0-0 \
    libcups2 \
    libdbus-1-3 \
    libdrm2 \
    libgbm1 \
    libgtk-3-0 \
    libnspr4 \
    libnss3 \
    libwayland-client0 \
    libxcomposite1 \
    libxdamage1 \
    libxfixes3 \
    libxkbcommon0 \
    libxrandr2 \
    xdg-utils \
    && rm -rf /var/lib/apt/lists/*

# 安装 playwright 浏览器
RUN playwright install chromium

# 配置 scrapyd
COPY docker/scrapyd.conf /etc/scrapyd/scrapyd.conf

# 创建必要的目录
RUN mkdir -p /app/logs /app/eggs /app/src

EXPOSE 6800

CMD ["scrapyd"] 